package docsim;

/**
 * String constants (regular expressions and common literals) used by topic mode algorithm.
 *
 * <p>This class only holds static members; it is not meant to be instantiated or extended.
 *
 * @author oraut
 */
public final class CONSTANTS
{
    /*
     * Regular expressions
     */

    /** Matches any single character that is not an ASCII letter or digit (whitespace included). */
    public static final String PUNCTUATION_REGEX = "[^a-zA-Z0-9]";

    /**
     * Matches the shortest span that starts with {@code <} and ends with {@code >} and has at
     * least one character in between (reluctant quantifier).
     */
    public static final String REGEX_BRACES = "<.+?>";

    /**
     * Matches a run of digits together with any non-alphanumeric characters that directly
     * follow it. Digits glued to letters match as well, e.g. {@code "1valid1"} contains two
     * matches.
     */
    public static final String REGEX_NUMBERS = "\\d+[^a-zA-Z0-9]*";

    /** Matches one or more consecutive whitespace characters. */
    public static final String REGEX_SPACE = "\\s+";

    /** Matches a whole word made of one or two word characters (letters, digits, underscore). */
    public static final String REGEX_SHORT_WORDS = "\\b[\\w]{1,2}\\b";

    /** Matches a single literal backslash. */
    public static final String REGEX_BACKSLASH = "\\\\";

    /** Matches a single forward slash. */
    public static final String REGEX_FORWARDSLASH = "/";

    /*
     * Other constants
     */

    /** A single space character as a string. */
    public static final String CHAR_SPACE = " ";

    /** The {@code file://} URI prefix. */
    public static final String URI_FILE_STRING = "file://";

    /** The empty string. */
    public static final String STRING_EMPTY = "";

    /** Not instantiable: this class is a holder for static constants only. */
    private CONSTANTS()
    {
        throw new AssertionError("CONSTANTS is not instantiable");
    }

    /**
     * Small manual check of {@link #REGEX_NUMBERS}: prints a sample string with every match
     * replaced by an underscore.
     *
     * @param args ignored
     */
    public static void main(String[] args) {
        String s = "121 2131 omkar asda 41234 1valid1";
        System.out.println(s.replaceAll(REGEX_NUMBERS, "_"));
    }
}
